\relax 
\citation{mendez2014climate}
\citation{muller2019escape}
\citation{noauthor_sve_nodate}
\citation{schulthess2018reflecting}
\citation{bauer_digital_2021}
\citation{schar2020kilometer,lapillonne2017using}
\@writefile{toc}{\contentsline {title}{Auto-CLOUDSC: An Auto-generation Framework for Vectorization and Optimization of Cloud Microphysics Parameterization on ARM CPUs}{1}{}\protected@file@percent }
\@writefile{toc}{\authcount {8}}
\@writefile{toc}{\contentsline {author}{ Tun Chen \and Jianping Wu\unskip {} \and Yuntian Zheng\and Yingjie Wang\and Fukang Yin\and Jinhui Yang\and Juan Zhao\and Xiaoli Ren }{1}{}\protected@file@percent }
\@writefile{toc}{\contentsline {section}{\numberline {1}Introduction}{1}{}\protected@file@percent }
\citation{ecmwf_ifs_2023}
\citation{noauthor_ecmwf-ifsdwarf-p-CLOUDSC_2025}
\citation{allen1987automatic,hampton2008compiling,kennedy2001optimizing}
\citation{song1999new,coleman1995tile}
\citation{wolf1991loop,mckinley1996improving}
\citation{ubbiali2024exploring,hague_ifs_2014}
\citation{fang2021performance,gao2023wrbench}
\@writefile{toc}{\contentsline {section}{\numberline {2}Auto-CLOUDSC: Auto-generation Architecture}{3}{}\protected@file@percent }
\newlabel{sec:Auto-CLOUDSC}{{2}{3}{}{section.2}{}}
\@writefile{toc}{\contentsline {subsection}{\numberline {2.1}Function Interface Generator}{3}{}\protected@file@percent }
\@writefile{lof}{\contentsline {figure}{\numberline {1}{\ignorespaces Auto-Generator Workflow}}{4}{}\protected@file@percent }
\newlabel{fig:auto-sve-arch}{{1}{4}{}{figure.1}{}}
\@writefile{loa}{\contentsline {algorithm}{\numberline {1}{\ignorespaces Vars\_in\_out\_tmp for Parameter Type Identification}}{5}{}\protected@file@percent }
\newlabel{alg:vars_in_out_tmp}{{1}{5}{}{algorithm.1}{}}
\@writefile{toc}{\contentsline {subsection}{\numberline {2.2}Code Structure Analyzer}{6}{}\protected@file@percent }
\@writefile{toc}{\contentsline {subsubsection}{Loop Transformation}{6}{}\protected@file@percent }
\@writefile{toc}{\contentsline {subsubsection}{Parallelization Level Determination}{6}{}\protected@file@percent }
\newlabel{equ:V}{{1}{6}{}{equation.1}{}}
\@writefile{toc}{\contentsline {subsubsection}{Generation of Predicate}{6}{}\protected@file@percent }
\@writefile{toc}{\contentsline {paragraph}{Predicate for Loop Structure}{6}{}\protected@file@percent }
\@writefile{loa}{\contentsline {algorithm}{\numberline {2}{\ignorespaces Vectorized and Scalar Loops}}{7}{}\protected@file@percent }
\newlabel{alg:vectorized_scalar_loops}{{2}{7}{}{algorithm.2}{}}
\newlabel{equ:svwhilelt}{{2}{7}{}{equation.2}{}}
\@writefile{toc}{\contentsline {paragraph}{Predicate for Branch Structure}{7}{}\protected@file@percent }
\@writefile{toc}{\contentsline {subsection}{\numberline {2.3}Expression Parser}{7}{}\protected@file@percent }
\@writefile{loa}{\contentsline {algorithm}{\numberline {3}{\ignorespaces Expression Analysis: \\ Example of $E = \mathrm  {MAX}(A+B, \mathrm  {MIN}(C, \mathrm  {EXP}(D^2)))$}}{8}{}\protected@file@percent }
\newlabel{alg:expression_analysis}{{3}{8}{}{algorithm.3}{}}
\newlabel{equ:Extract}{{3}{8}{}{equation.3}{}}
\@writefile{toc}{\contentsline {section}{\numberline {3}Optimization of Loop Transformations}{9}{}\protected@file@percent }
\newlabel{sec:loop_opt}{{3}{9}{}{section.3}{}}
\@writefile{loa}{\contentsline {algorithm}{\numberline {4}{\ignorespaces Comparison of Parallel Grid Computing Structures}}{10}{}\protected@file@percent }
\newlabel{alg:grid_computing_comparison}{{4}{10}{}{algorithm.4}{}}
\@writefile{toc}{\contentsline {subsection}{\numberline {3.1}Physics-combine Algorithm in the Temporal Dimension}{10}{}\protected@file@percent }
\@writefile{lof}{\contentsline {figure}{\numberline {2}{\ignorespaces Vectorized parallel computation for physical-process parameterization}}{11}{}\protected@file@percent }
\newlabel{fig:vector}{{2}{11}{}{figure.2}{}}
\@writefile{toc}{\contentsline {subsection}{\numberline {3.2}Cache-Aware Algorithm in the Spatial Dimension}{11}{}\protected@file@percent }
\newlabel{formu:cache_aware}{{4}{11}{}{equation.4}{}}
\citation{noauthor_ecmwf-ifsdwarf-p-CLOUDSC_2025}
\@writefile{lot}{\contentsline {table}{\numberline {1}{\ignorespaces Experimental Environment}}{12}{}\protected@file@percent }
\newlabel{tab:Environment_FT2000}{{1}{12}{}{table.1}{}}
\newlabel{formu:nb_condition}{{5}{12}{}{equation.5}{}}
\@writefile{toc}{\contentsline {section}{\numberline {4}Performance Evaluation}{12}{}\protected@file@percent }
\newlabel{sec:Perf-Evaluation}{{4}{12}{}{section.4}{}}
\@writefile{toc}{\contentsline {subsection}{\numberline {4.1}Setup}{12}{}\protected@file@percent }
\@writefile{toc}{\contentsline {subsection}{\numberline {4.2}Performance Analysis}{13}{}\protected@file@percent }
\citation{noauthor_ecmwf-ifsloki_2025}
\citation{clement2019automatic}
\citation{1055553175812}
\citation{dagum_openmp_1998}
\citation{dahm2023pace}
\@writefile{lot}{\contentsline {table}{\numberline {2}{\ignorespaces Speedup of Vector, Loop and Loop\_Vector methods over Baseline for different input sizes (ngptot) and block sizes (npromas).}}{14}{}\protected@file@percent }
\newlabel{tab:speedup_FT2000}{{2}{14}{}{table.2}{}}
\@writefile{lof}{\contentsline {figure}{\numberline {3}{\ignorespaces Execution time of the baseline, the Vector, the Loop and the Loop\_Vector version}}{15}{}\protected@file@percent }
\newlabel{fig:Time_vs_npromas_Size_multi_bigfont}{{3}{15}{}{figure.3}{}}
\@writefile{toc}{\contentsline {section}{\numberline {5}Related Work}{15}{}\protected@file@percent }
\newlabel{sec:Related-Work}{{5}{15}{}{section.5}{}}
\citation{harris2020array,afanasyev2021gridtools,ben2019stateful}
\citation{harris2020array}
\citation{afanasyev2021gridtools}
\citation{ben2019stateful}
\citation{martin2023dace}
\citation{ubbiali2024exploring}
\citation{beazley_david_nodate}
\citation{fang2021performance,xia2021kunpeng,sato2020co}
\bibstyle{splncs04}
\bibdata{Cmm}
\bibcite{noauthor_sve_nodate}{1}
\@writefile{toc}{\contentsline {section}{\numberline {6}Conclusion}{17}{}\protected@file@percent }
\newlabel{sec:Conclusion}{{6}{17}{}{section.6}{}}
\bibcite{noauthor_ecmwf-ifsdwarf-p-CLOUDSC_2025}{2}
\bibcite{noauthor_ecmwf-ifsloki_2025}{3}
\bibcite{afanasyev2021gridtools}{4}
\bibcite{allen1987automatic}{5}
\bibcite{bauer_digital_2021}{6}
\bibcite{beazley_david_nodate}{7}
\bibcite{ben2019stateful}{8}
\bibcite{1055553175812}{9}
\bibcite{clement2019automatic}{10}
\bibcite{coleman1995tile}{11}
\bibcite{dagum_openmp_1998}{12}
\bibcite{dahm2023pace}{13}
\bibcite{ecmwf_ifs_2023}{14}
\bibcite{fang2021performance}{15}
\bibcite{gao2023wrbench}{16}
\bibcite{hague_ifs_2014}{17}
\bibcite{hampton2008compiling}{18}
\bibcite{harris2020array}{19}
\bibcite{kennedy2001optimizing}{20}
\bibcite{lapillonne2017using}{21}
\bibcite{martin2023dace}{22}
\bibcite{mckinley1996improving}{23}
\bibcite{mendez2014climate}{24}
\bibcite{muller2019escape}{25}
\bibcite{sato2020co}{26}
\bibcite{schar2020kilometer}{27}
\bibcite{schulthess2018reflecting}{28}
\bibcite{song1999new}{29}
\bibcite{ubbiali2024exploring}{30}
\bibcite{wolf1991loop}{31}
\bibcite{xia2021kunpeng}{32}
\gdef \@abspage@last{19}
